# encoding: utf-8
# Build the alphabet (the set of distinct characters) for the recognition
# dataset.
#
# Reads the lexicon file line by line, echoes each stripped line, collects
# every character that appears, then prints a summary followed by the
# alphabet as a single string.
lexiconPath = r'F:\laibo\Data\CRNN_data\AllCRNNTestList\lexicon.txt'
alphabet = set()
# NOTE(review): if the lexicon was saved with a UTF-8 BOM, U+FEFF would be
# counted as a character here — confirm the file has no BOM.
with open(lexiconPath, 'r', encoding='utf-8') as f:
    # Iterate the file object directly so the whole lexicon is never
    # materialized as a list.
    for line in f:
        entry = line.strip()  # drop the newline and surrounding whitespace
        print(entry)
        alphabet.update(entry)  # iterating a str yields its characters
print(f'本数据集共有{len(alphabet)}个不同字符，分别是{alphabet}')
# Iteration order of a set of strings varies between interpreter runs (string
# hash randomization), so sort to emit the same alphabet string every time.
print(''.join(sorted(alphabet)))
